#!/usr/bin/env bash
# Launch the vLLM OpenAI-compatible API server (vllm.entrypoints.openai.api_server)
# for a local Qwen2.5-7B-Instruct checkpoint, pinned to a single GPU.
#
# Every setting may be overridden from the environment; the defaults reproduce
# the values that were previously hard-coded:
#   SERVE_GPU        value for CUDA_VISIBLE_DEVICES  (default: 5)
#   SERVE_HOST       address passed to --host        (default: 127.0.0.1)
#   SERVE_PORT       port passed to --port           (default: 8989)
#   SERVE_MODEL      path passed to --model          (default: /file/ljw22/Qwen2.5-7B-Instruct)
#   SERVE_TOKENIZER  path passed to --tokenizer      (default: same as SERVE_MODEL)
#
# Deliberately limited to POSIX sh syntax so `sh <script>` keeps working.

serve_gpu="${SERVE_GPU:-5}"
serve_host="${SERVE_HOST:-127.0.0.1}"
serve_port="${SERVE_PORT:-8989}"
serve_model="${SERVE_MODEL:-/file/ljw22/Qwen2.5-7B-Instruct}"
# The tokenizer follows the model path unless explicitly overridden, so the
# path only has to be changed in one place.
serve_tokenizer="${SERVE_TOKENIZER:-${serve_model}}"

# Enumerate GPUs in PCI bus order so the index selected below refers to the
# same physical device as tools that list GPUs by bus ID.
export CUDA_DEVICE_ORDER=PCI_BUS_ID
export CUDA_VISIBLE_DEVICES="${serve_gpu}"

# The script's exit status is that of the server process.
python -m vllm.entrypoints.openai.api_server \
  --host="${serve_host}" \
  --port="${serve_port}" \
  --model="${serve_model}" \
  --tokenizer="${serve_tokenizer}"
